<!DOCTYPE html>
<html lang="zh-CN">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>LMArena - 开源AI模型评估平台</title>
    <meta name="description" content="LMArena 是一个开源AI模型评估平台，通过人类偏好评估大型语言模型，让AI选择变得简单而可靠。">
    <!-- Open connections to the Google Fonts origins early; the font CSS below is render-blocking. -->
    <link rel="preconnect" href="https://fonts.googleapis.com">
    <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
    <link href="https://cdn.staticfile.org/font-awesome/6.4.0/css/all.min.css" rel="stylesheet">
    <link href="https://cdn.staticfile.org/tailwindcss/2.2.19/tailwind.min.css" rel="stylesheet">
    <link href="https://fonts.googleapis.com/css2?family=Noto+Serif+SC:wght@400;500;600;700&family=Noto+Sans+SC:wght@300;400;500;700&display=swap" rel="stylesheet">
    <!--
        Mermaid is pinned to a major version instead of the floating "latest" tag so that a
        future breaking release cannot silently change or break the diagrams on this page.
        The script is intentionally loaded synchronously (no defer/async): inline scripts
        further down the page may reference the global `mermaid` object as soon as they run.
    -->
    <script src="https://cdn.jsdelivr.net/npm/mermaid@11/dist/mermaid.min.js"></script>
    <style>
        /* Base typography: Noto Sans SC first, then common CJK/system fallbacks. */
        body {
            font-family: 'Noto Sans SC', Tahoma, Arial, Roboto, "Droid Sans", "Helvetica Neue", "Droid Sans Fallback", "Heiti SC", "Hiragino Sans GB", Simsun, sans-serif;
        }
        /* Serif face used for headings. */
        .serif-font {
            font-family: 'Noto Serif SC', serif;
        }
        /* Gradient-filled text: the background is clipped to the glyph shapes and the
           text fill is made transparent so the gradient shows through. */
        .gradient-text {
            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
            -webkit-background-clip: text;
            -webkit-text-fill-color: transparent;
            background-clip: text;
        }
        /* Full-bleed gradient background (same colour stops as the gradient text). */
        .hero-gradient {
            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
        }
        /* Card lift effect. Only the two properties that actually change on hover are
           transitioned, rather than `all`, so unrelated property changes are not animated. */
        .card-hover {
            transition: transform 0.3s ease, box-shadow 0.3s ease;
        }
        .card-hover:hover {
            transform: translateY(-4px);
            box-shadow: 0 20px 40px rgba(0,0,0,0.1);
        }
        /* Respect the user's reduced-motion preference: keep the shadow change as the
           hover cue but drop the movement and the animation. */
        @media (prefers-reduced-motion: reduce) {
            .card-hover {
                transition: none;
            }
            .card-hover:hover {
                transform: none;
            }
        }
        /* Gradient-filled icon glyphs; same technique as .gradient-text. */
        .feature-icon {
            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
            -webkit-background-clip: text;
            -webkit-text-fill-color: transparent;
            background-clip: text;
        }
        /* Drop cap: enlarges and floats the first letter of the paragraph. */
        .drop-cap::first-letter {
            float: left;
            font-size: 4rem;
            line-height: 3rem;
            padding-right: 0.5rem;
            margin-top: 0.5rem;
            font-weight: 700;
            color: #667eea;
        }
        /* Centre Mermaid diagrams horizontally inside their container. */
        .mermaid {
            display: flex;
            justify-content: center;
            margin: 2rem 0;
        }
    </style>
</head>
<body class="bg-gray-50">
    <!-- Hero Section -->
    <section class="hero-gradient text-white py-20 px-6">
        <div class="max-w-6xl mx-auto">
            <div class="text-center">
                <h1 class="text-5xl md:text-7xl font-bold mb-6 serif-font">LMArena</h1>
                <p class="text-xl md:text-2xl mb-8 opacity-90">开源AI模型评估平台</p>
                <p class="text-lg max-w-3xl mx-auto leading-relaxed opacity-80">
                    通过人类偏好评估大型语言模型，让AI选择变得简单而可靠
                </p>
                <div class="mt-10 flex justify-center space-x-4">
                    <!--
                        External link opened in a new tab: rel="noopener noreferrer" stops the
                        target page from reaching back through window.opener. The icon is
                        decorative, so it is hidden from assistive technology, and the
                        screen-reader-only text announces that a new tab will open.
                    -->
                    <a href="https://lmarena.ai/" target="_blank" rel="noopener noreferrer" class="bg-white text-purple-700 px-8 py-3 rounded-full font-semibold hover:bg-gray-100 transition">
                        <i class="fas fa-external-link-alt mr-2" aria-hidden="true"></i>访问平台<span class="sr-only">（在新标签页中打开）</span>
                    </a>
                    <!-- In-page jump to the element with id="features"; the sr-only text gives the link meaning out of context. -->
                    <a href="#features" class="border-2 border-white px-8 py-3 rounded-full font-semibold hover:bg-white hover:text-purple-700 transition">
                        了解更多<span class="sr-only">核心功能</span>
                    </a>
                </div>
            </div>
        </div>
    </section>

    <!-- Introduction Section -->
    <section class="py-16 px-6">
        <div class="max-w-4xl mx-auto">
            <div class="bg-white rounded-2xl shadow-xl p-10">
                <h2 class="text-3xl font-bold mb-6 serif-font">平台简介</h2>
                <!-- .drop-cap styles the first letter of this paragraph as a large floated initial. -->
                <p class="text-lg leading-relaxed text-gray-700 drop-cap">
                    LMArena是一个革命性的开源平台，专为评估大型语言模型而设计。它通过匿名比较多个AI模型的响应质量，生成透明的排行榜，帮助研究人员、开发者、产品经理和AI爱好者在快速演变的LLM景观中做出明智选择。
                </p>
                <!--
                    Three highlights. The icons are purely decorative (each heading carries the
                    meaning), so they are hidden from assistive technology with aria-hidden.
                -->
                <div class="mt-8 grid grid-cols-1 md:grid-cols-3 gap-6">
                    <div class="text-center">
                        <i class="fas fa-users text-4xl feature-icon mb-3" aria-hidden="true"></i>
                        <h3 class="font-semibold text-lg">社区驱动</h3>
                        <p class="text-gray-600 mt-2">众包评估，集体智慧</p>
                    </div>
                    <div class="text-center">
                        <i class="fas fa-chart-line text-4xl feature-icon mb-3" aria-hidden="true"></i>
                        <h3 class="font-semibold text-lg">实时更新</h3>
                        <p class="text-gray-600 mt-2">动态排行榜，紧跟趋势</p>
                    </div>
                    <div class="text-center">
                        <i class="fas fa-code-branch text-4xl feature-icon mb-3" aria-hidden="true"></i>
                        <h3 class="font-semibold text-lg">完全开源</h3>
                        <p class="text-gray-600 mt-2">透明可信，社区共建</p>
                    </div>
                </div>
            </div>
        </div>
    </section>

    <!-- Problem Solution Section -->
    <section class="py-16 px-6 bg-gray-100">
        <div class="max-w-6xl mx-auto">
            <h2 class="text-4xl font-bold text-center mb-12 serif-font">解决的核心问题</h2>
            <!--
                Two side-by-side cards (stacked on small screens): the problem and the answer.
                The warning/check icons only reinforce the headings next to them, so they are
                hidden from assistive technology with aria-hidden.
            -->
            <div class="grid grid-cols-1 md:grid-cols-2 gap-8">
                <div class="bg-white rounded-xl p-8 card-hover">
                    <div class="flex items-start">
                        <i class="fas fa-exclamation-triangle text-3xl text-red-500 mr-4 mt-1" aria-hidden="true"></i>
                        <div>
                            <h3 class="text-xl font-bold mb-3">传统基准测试的局限</h3>
                            <p class="text-gray-700 leading-relaxed">
                                静态基准如GLUE或MMLU容易被模型"作弊"优化，无法反映真实世界性能。主观评估依赖专家，成本高且存在偏差。
                            </p>
                        </div>
                    </div>
                </div>
                <div class="bg-white rounded-xl p-8 card-hover">
                    <div class="flex items-start">
                        <i class="fas fa-check-circle text-3xl text-green-500 mr-4 mt-1" aria-hidden="true"></i>
                        <div>
                            <h3 class="text-xl font-bold mb-3">创新解决方案</h3>
                            <p class="text-gray-700 leading-relaxed">
                                通过众包匿名战斗和Elo评分系统，提供动态、基于人类判断的排行榜，确保评估的客观性和实用性。
                            </p>
                        </div>
                    </div>
                </div>
            </div>
        </div>
    </section>

    <!-- Core Features Section -->
    <section id="features" class="py-16 px-6">
        <div class="max-w-6xl mx-auto">
            <h2 class="text-4xl font-bold text-center mb-12 serif-font">核心功能</h2>
            <!--
                Responsive grid of six feature cards (1 / 2 / 3 columns by breakpoint).
                Every icon is decorative (the card heading names the feature), so each one
                carries aria-hidden="true" to keep icon-font glyphs out of the accessibility tree.
            -->
            <div class="grid grid-cols-1 md:grid-cols-2 lg:grid-cols-3 gap-8">
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-user-secret text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">匿名模型战斗</h3>
                    <p class="text-gray-700">用户输入提示后，随机收到两个模型的响应进行盲选投票，确保公平比较。</p>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-images text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">多模态竞技场</h3>
                    <p class="text-gray-700">支持文本、图像生成、视觉理解等不同领域，覆盖从聊天到多媒体生成的全面场景。</p>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-trophy text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">实时Elo排行榜</h3>
                    <p class="text-gray-700">基于投票计算模型分数，持续更新，支持置信区间显示，快速识别顶级模型。</p>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-database text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">开源数据集共享</h3>
                    <p class="text-gray-700">收集并公开人类偏好数据，包括数百万投票记录，促进AI社区协作。</p>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-sliders-h text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">风格控制与偏见校正</h3>
                    <p class="text-gray-700">调整响应风格以减少人类偏见影响，使用logistic回归分解偏好因素。</p>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8 card-hover">
                    <i class="fas fa-shield-alt text-4xl feature-icon mb-4" aria-hidden="true"></i>
                    <h3 class="text-xl font-bold mb-3">透明可信</h3>
                    <p class="text-gray-700">开源方法论包括身份泄露过滤，提升透明度和抗操纵性。</p>
                </div>
            </div>
        </div>
    </section>

    <!-- Workflow Visualization -->
    <section class="py-16 px-6 bg-gray-100">
        <div class="max-w-6xl mx-auto">
            <h2 class="text-4xl font-bold text-center mb-12 serif-font">工作流程</h2>
            <div class="bg-white rounded-2xl shadow-xl p-10">
                <!--
                    Mermaid replaces the text inside .mermaid with a rendered SVG flowchart.
                    accTitle / accDescr are Mermaid's accessibility directives: they become the
                    SVG's <title> and <desc>, giving screen-reader users a text alternative
                    for the diagram. Keep this comment outside the .mermaid element so it is
                    not parsed as diagram source.
                -->
                <div class="mermaid">
                    graph LR
                        accTitle: LMArena 工作流程
                        accDescr: 用户输入提示后，系统随机分配两个模型分别生成响应并匿名展示，用户投票后更新Elo评分，进而生成实时排行榜和社区洞察
                        A[用户输入提示] --> B[系统随机分配模型]
                        B --> C[模型A生成响应]
                        B --> D[模型B生成响应]
                        C --> E[匿名展示结果]
                        D --> E
                        E --> F[用户投票选择]
                        F --> G[更新Elo评分]
                        G --> H[实时排行榜]
                        H --> I[社区洞察]
                </div>
            </div>
        </div>
    </section>

    <!-- Use Cases Section -->
    <section class="py-16 px-6">
        <div class="max-w-6xl mx-auto">
            <h2 class="text-4xl font-bold text-center mb-12 serif-font">实际应用场景</h2>
            <!--
                Vertically stacked use-case cards. The leading icons are decorative (each
                card's heading names the audience), so they are hidden from assistive
                technology with aria-hidden="true".
            -->
            <div class="space-y-8">
                <div class="bg-white rounded-xl shadow-lg p-8">
                    <div class="flex items-start">
                        <i class="fas fa-code text-3xl text-purple-600 mr-4 mt-1" aria-hidden="true"></i>
                        <div>
                            <h3 class="text-2xl font-bold mb-3">开发者场景</h3>
                            <p class="text-gray-700 leading-relaxed">
                                AI开发者在构建聊天机器人时，可以输入典型用户查询，比较GPT-4o与Claude 3.5 Sonnet的响应，选择更一致的模型集成到应用中，从而减少后期调试时间。
                            </p>
                        </div>
                    </div>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8">
                    <div class="flex items-start">
                        <i class="fas fa-microscope text-3xl text-purple-600 mr-4 mt-1" aria-hidden="true"></i>
                        <div>
                            <h3 class="text-2xl font-bold mb-3">研究者场景</h3>
                            <p class="text-gray-700 leading-relaxed">
                                研究人员评估图像生成模型时，可上传提示到视觉竞技场，投票比较DALL-E 3与Stable Diffusion的输出质量，形成数据集用于论文分析。
                            </p>
                        </div>
                    </div>
                </div>
                <div class="bg-white rounded-xl shadow-lg p-8">
                    <div class="flex items-start">
                        <i class="fas fa-briefcase text-3xl text-purple-600 mr-4 mt-1" aria-hidden="true"></i>
                        <div>
                            <h3 class="text-2xl font-bold mb-3">产品经理场景</h3>
                            <p class="text-gray-700 leading-relaxed">
                                产品经理在评估LLM用于内容审核时，平台的多模态支持允许测试安全性和逻辑一致性，生成报告指导供应商选择。
                            </p>
                        </div>
                    </div>
                </div>
            </div>
        </div>
    